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APPENDIX I: Sample Java Source Code 

// Java class function to analyse a series of link 

// directors 

// Author: David Siegel 

// 

import java.util - 
import java.io.*; 
import java.lang.*; 

import Folder; 
import Directory; 
import Permutation; 

class Analyze { 
Directory _dir? 
Folder JL ; 
doublet] _re suits; 

// Constructor that creates an instance of the analyze 
// class. We pasB in the directory tree that contains 
// all link folders in che system and a folder to be 
// matched against the directory, 
public Analyze (Directory dir, Polder f) { 

_dir » dir; 

_f « f; 

_results - new double (1000] ; 

ine i; 

for (i=0; iclOOO; !*•+) 
resulted] - 0.0; 

].• 

// Compute all combinations of the folder given in the 
// analyse contructor and run the matching algorithm on 
//each. We take all combinations of m links taken n 
// at a time, where m is the number of links in the 
// exemplar folder and n ranges from m to l. 
public Polder permute (double thresh, int level) { 

int[] x = _f . toArrayO 

int n « f .count () ; 

int i; ~ 

// This bootstraps the combination process by calling 
// the combination helper routine ones for each m 
// (where m is the number of items being considered 
// in the combination, as described above, 
for (ion-1; i>0; 1--) { 

intt) p = new int [i] ; 

doPerraute (p, x, n, i, i) ; 

} 

Folder folder = new Folder () ; 

//We build a folder here with the summary results 
// from all matches that we found by running the 
// above permutation. Note that we only include 
// matches that exceed a given score threshold , as 
// specified in an argument to this routine, we 
// weight the score by the "level**, where level is 
// the number of times the routine was reinvoked on 
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// its own results. This is how indirect 
// relationships are found, 
for (ioO; i<1000; i++> { 

double v » _resultsli] / < double) level ; 
if <(v > 0)~&& !_f .contains (i) > { 

System, out . print In <i + n > ■ + v) 

if (v > thresh) 

folder. addliink(i) ; 

} 

} 

return folder; 

}; 

// This method does the work of the matching process. 
// The actual combinations m at a time are computed 
// here, recursively. The cumulative result score is 
// also computed. 
// 

// Arguments to the routine: 
// p: accumulated permutations 
// x: input array 
// n: length of input array 
// m: remaining count to permute 
// c: total length of permutation 
private void doPermute (int [] p, int[] x, int n, 
int m. int c) 

{ 

int i, j; 

// Create a copy of the input link list omitting one 
// link at a time. This is done to compute the 
// combinations of links, 
for (i*0; i<n; i++) { 

int I J xCopy « new inttn-1]; 
for <j-0; j<n-l; { 
if (j<i) 

xCopy(j] - x[j] ; 
else 

xCopy [j] = xlj+i] ; 

} 

// Build the new combination of links to be 
// considered. 
p[m-l] ~ xti] ; 

//If the length of the remaining links to be added 
// to the combination is greater than one, invoke 
// the routine recursively to add the remaining 
// links to the combination. If not, we've got a 
// combination and are ready to compute a score, 
if <m > 1) { 

doPermute <p, xCopy, n-1, m-1, c) ; 
} else { 

// Build a link folder from the combination. 
Polder f - new Folder <p, c) ; 

// Match this folder against the directory tree, 
// looking for all folders that contain this 
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// exact set of links. 

Directory. Result rc - _dir . finds imilar (f) ; 

// Create a score weighting factor. Here, c is the 
// total length of the permutation and _f. count () is 
// the total length of the initial exemplar 
// provided. Thus, the more links from the original 
// exemplar provided that are in this combination, 
// the greater the score. 

double factor « (double) c/ (double) _f .count () ; 

// Now scan all matches and record the scores for 
// each link. Only keep .the highest score, since 
// the link could be find in more than one of the 
// combination passes through this routine, 
int k; 

for <k-0; k<1000; k+-#-> { 

double v o (rc . folders [k] * factor) /rc . total; 
if (v > ^results [k] ) 
_results [k] » v; 

} 



}; 

// Print a summary of the results. 

public int printStats (Folder folder, int results [] , 
int total, double factor) 

{ 

int i; 

for <i=0; i<1000; i++) { 
if (results [i) > 0) 

System. out. print In ("Pound • " + i + " 1 " + 
results [i) + ** times (■ + 

((float) results [i)*f actor)/ (float) total + ">"); 

) 

return total; 

}; 

// Helper function to print an array, 
public void pr int Array (int [] array, int count) { 
int i; 

for (ioO ; i< count i++) 

System. out .print (array [i] ♦ ") ; 
System, out . print In () ; 

}; 

} 

// 

// Java functions to manipulate a system wide directory 

// of link folders. 

// Author: David Siegel 

// 

import java -util . * ,- 
import j ava . io . * ; 
import j ava . lang . * ; 

import Polder ; 
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class Directory { 

private Folder!) _f olders; 
private int _al located; 
private int _inUse; 

// Create an empty directory (limit ted to 10 00 link folders for now) . 
public Directory I) { 

_f olders - new Folder [1000] ; 

_al located - 1000; 

_inUse = 0; 

); 

// Add a folder from a string to the system wide folder 
// directory. 

public int addPolder (String s) { 
Folder f « new Folder ( ) ; 
f .addLinks <s> ; 
return addFolder <f > ; 

>.- 

// Add a folder from a folder class to the system wide 

// folder directory. 

public int addFolder (Folder f) { 

_f olders [_inUsel - f; 

return _inUse++; 

); 

// Count the number of times all links in an exemplar 
// folder match against folders in the system wide 
// directory. 

public int match (Folder exemplar) { 
int count = 0; 
int ij 

for (i»0; i<_inUse; i++) { 

if (_f olders [i] .match (exemplar) ) 
count 

» 

return count; 

>; 

// Helper class that is the return value of the next 
// function, 
class Result { 

int (] folders; 

int total; 

}; 

// This function takes an exemplar folder as an input, 
// and return an array that counts how many times each 
// link in the exemplar appears in the directory. For 
// example, folders Ci] of the result contains the count 
//of how many times link i matched against all the 
// links in the directory. 

public Result findSimilar (Folder exemplar) { 
int results [] - new int (10001; 
int matches » 0; 
int i; 
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// Xnitalize the return result counts to 0. 
for (1=0; i<1000; 
results [i] « 0; 

// For each folder in the system, see if we have 
// matches against the exemplar. If we do, add one 
// to the count for a match for a link each time a 
// match has been found, 
for li=0; i<_inUse; { 

if <_folders til .match (exemplar) ) { 
matches**; 

Enumeration el ems =» _f older a [i ] . Keys ( ) ; 
whi le ( elems . ha slioreE lenient s ( ) ) { 

Integer link o (integer) elems .next Element () ; 

if ( J exemplar .contains (link) ) 
results (link, int Value () ] ++; 

} 

} 

} 

// Build and return the results. 
Result rc « new Result (); 
rc. folders a results; 
rc. total - matches; 
return rc; 

}; 
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// 

// Java functions to manipulate a link folder. 

// Author: David Siegel 

// 

import java.util.*; 
import j ava . io . * ; 
import j ava . 1 ang . * ; 

class Folder { 

private Hashtable _f older ; 

// Constructor to create an empty link folder, 
public Folder 0 { 

_f older = new Hashtable () ; 

}; 

// Constructor to create a link folder from a string 
// listing the links in the folder, 
public Folder (String linkString) { 

_f older - new Hashtable <) ; 

addLinks (linkString) ; 

); 

// constructor to create a link folder from an array, 
// where only the links that have a score greater than 
// the given threshold are added to the link folder, 
public Folder (int I) linkArray, int divisor, 
double thresh) 

{ 

int i; 

_f older = new Hashtable < ) ; 
for (i-0; i<1000; i++) { 

if ( (double) linkArray [i]/ (double) divisor > thresh) 
_f older. put (new Integer < (int) i ) , ""); 

} 

}; 

// Constructor to create a link folder from an array, 
public Folder (int [] array , int count) { 
int i; 

_f older o new Hashtable ( ) / 
for (i-0; i<count; i ++) { 

_folder .put (new Integer ( (int ) array [i] ) , *») ; 

) 

}; 

// Return the links in the folder, 
public Enumeration keys ( ) { 
return folder . keys ( ) ,- 

}; 

// Add a bunch of links in string format to a folder, 
public int addLinks (String linkString) { 
Reader in; 

in « new St ringReader (linkString) 

StreamTokeni2er parser « new StreamTokenizer (in) ; 
try { 
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whi le (parser . nexCToken ( ) ! = 

s t r eamTokeni ze r . TT_EOF > 

< 

switch (parser . ttype) { 
case St reamTokeni zer . TT_EO L : 
break ? 

case St reamTokeni ze r . TT_ NUMBER : 

_folder.put (new Integer ( (int) parser .nval) , t "*) ; 
break; 

} 

} 

) catch (IOBxception e) { 
return -1 ; 

) 

return 0; 

>* 

// Method to add a link to the folder, 
public void addLinMint link) { 

folder. put (new Integer < (int ) link) , ""); 

} 

// Determine if the folder contains a given link, 
public boolean contains (int link) { 

return _f older. containsKey (new Integer (link) ) ; 

}; 

// Same as above for Integer type, 
public boolean contains (Integer link) { 
return _f older .containsKey (link) ; 

}; 

// Determine if an example folder matches the given 
// folder. 

public boolean match (Folder exemplar) { 

Enumeration elems « exemplar ._f older, keys () ; 
boolean found = true , 

// Iterate through all the links in the exemplar and 
// make sure each and every one is in the folder, 
while (elems .hasMoreEl entente ( ) ) { 

Integer link (Integer) elems . nextElement () ; 
if ('.contains (link. intValueO)) { 
found => false; 
break ; 

) 

} 

// Return true if we have a match, 
return found; 

}.• 

// Determine if an example folder matches the given 
// folder. 

public void print () { 

Enumeration elems «= _f older . keys () ; 
whi le (elems . hasMoreElements ( ) ) { 

Integer link = (Integer) elems .nextBlement () ; 
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System. out .print (link -t- " n ) ; 

} 

System. out . println () ; 

>; 

// Convert to an array, 
public int [} toArrayO { 

int {] array = new int [_f older . eize ()] ; 

Enumeration elems = f older . keys <) ; 

int i o 0; 

while (elems . hasMoreElements ( ) ) { 

Integer link « ( Integer )e lews .next Element () ; 
array[i++] « link, int Value () ; 

} 

return array; 

}; 

// Return the number of links in the folder, 
public int count () { 
return _f older. size () ; 

b 
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// 

// Main, test harness for the link matching algorithms. 
// Author: David Siegel 

// 

import java.util.*; 
import j ava . io . * ; 
import java . lang - * ; 

import Folder; 
import Directory; 
import Analyze 

class Main { 

public static void main(String argvf]) { 
Directory dir « new Directory () ; 

// Add a bunch of folders to the system directory. 
// Each number represents a link number. Each call 
//to addPolder adds a new folder. For the purposes 
//of this test we do not track the folder directory 
// structure or the folder owner. 



dir . addFolder ( 


"1 


2 


3 


5") ; 




dir. addPolder < 


["1 


2 


3 


5") ; 




dir . addFolder 4 


-1 


2 


3 


5") ; 




dir . addPolder \ 


"1 


2 


3 


7") ; 




dir . addPolder i 


"2 


2 


3 


7»> ; 




dir .addPolder 


"2 


2 


3 


9") ; 




dir. addFolder 4 


k n 2 


2 


3 


5") ; 




dir. addPolder 


'"1 


5 


9 


10") f 




dir. addPolder 


["1 


5 


9 


10") ; 




dir . addPolder 


I"l 


5 


9 


11") § 




dir . addFolder 


!"i 


5 


9 


11") ; 




dir . addFolder 


["l 


5 


9 


12") ; 




dir. addPolder 


["1 


5 


9 


12") ; 




dir . addFolder 


["l 


5 


9 


12") ; 




dir . addFolder 


I"l 


5 


9 


12") ; 




dir . addFolder 


1-1 


5 


9 


12°) ; 




dir . addFolder \ 


»l 


5 


9 


12") ; 




dir . addFolder \ 


"10 


11 


12 44" 


) 


dir . addFolder 


["12 


15 


19 23" 


) 


dir. addFolder 


["12 


15 


19 22" 


) 


dir . addFolder 


; n i2 


15 


19 22" 


) 


di r . addFolder 


;°i2 


15 


19 22" 


) 


dir . addPolder \ 


"12 


15 


19 22" 


) 


dir . addFolder 


:°i2 


15 


19 22" 


) 


dir . addFolder 


•12 




15 


19 22" 


) 


di r . addPolder 


"12 




15 


19 22" 


) 


dir . addFolder { 


"12 




15 


19 22" 


) 



// Perform the matching process with the specified 
// exemplar folder. Thus, the input to the matching 
// process is the system wide folder directory that 
// was created above, plus an exemplar folder. The 
// goal is to find links that are related to the 
// input exemplary. 
System. out . print In ("Level 1;"); 
Analyze study « new Analyze (dir, 

new Folder ("1 2 3 4 5 9")); 
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Folder f - study .permute (0 . 01, 1) ; 

// We now re invoke the matching algorithm on the 

// results of the first match. This is in essence a 

// level 2 match which finds indirectly related links 

// to the initially given exemplar. This process 

// could be repeated to find level 3, 4, etc. 

// relationships, though after a while the 

// relationships become too distant to be meaningful. 

System. out .print In < "Level 2:") ; 

study « new Analyze (dir, f ) ; 

study -permute (0.01 . 2); 
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/* $ld: RelatedUrl. j ava, v 1.4 Exp $ */ 

// Author: David Siegel 

// 

package BlinkUtil; 

import java.io.*; 

i mpor t j ava . lang . * ; 

import java.util.*; 

import java.util .Date ; 

import j ava. text.*; 

import java.sql.*; 

import java.sql . SQLBxcept ion ; 

public class RelatedUrl extends Url { 

private int _matchCount; 

public void finalize () throws Throwable { 
super .finalize () ; 

} 

public RelatedUrl (Session session* ResultSet rs> throws SQLException { 
super (session, rs) ; 

jmatchCoun t » rs . get Int ( "match_count " ) ; 

} 

public int matchCountO { 
re turn mat chCount ; 

> 

public void addMatchCount (RelatedUrl rurl) { 
jmatchCount +» rurl ._matchCount; 

} 

} 
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/* $Id: RelatedUrlDir. java,v 1.7 Exp $ */ 

// Author: David Siegel 

// 

package BlinkUtil; 

import java.io.*; 

i mport j ava . lang . * ; 

import java.util. 

import java.util .Date ; 

import j ava - text . * ; 

import java.eql.*; 

import java . sql . SQLException; 

public class RelatedUrlDir { 

Session _session; 
Hashtable _ht; 
RelatedUrl [J _rurlB; 

public void finalize 0 throws Throwable { 
super. finalize () ; 
^session = null; 
_ht = null; 
_rurls = null; 

} 

public RelatedUrlDir (Session session) { 
__session - session; 
_ht » null; 
_rurls m null; 

} 

public Session sessionO { 
return session; 

> 

public RelatedUrl [] items <) { 
return rurls; 

} 

public int sizeC) { 
if (_rurls null) 

return 0; 
else 

return _rur Is . length; 

) 

public void add (ResultSet rs) throws SQLException { 
RelatedUrl next = new RelatedUrl <_session, rs) ; 

RelatedUrl rurl «= (RelatedUrl) _ht . get (new integer (next .ur lid 0 )) ; 
if (rurl — null) 

_ht . put (new Integer (next . urlld ( ) ) , next > ; 
else 

rurl . addMat chCount (next ) ; 

) 

public void update (int dirld) throws SQLException, FatalBxception { 
_ht a new Hashtable ( ) ; 
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SQL. RelatedUrlDir (this, dirld) ; 

if (_ht.size() > 0) { 

_rurls ta new RelatedUrl [_ht . size ( } ] ; 
Enumeration el ems = _ht .elements () ; 
int i - 0; 

while (el ems .hasMoreEl entente () ) { 

RelatedUrl rurl o (RelatedUrl) elems .nextElement () ; 
_rurlsli++] = rurl; 

} 

sort ( > ; 
} else 

_rurls o null; 

} 

private void sortO { 
int i, j; 

for (i o 0; i < _rurls . length- 1; i++) { 
for (j - i+l; j < _rurls. length; { 
if (__mrls (i] .matchCount (> < _rurlB I j) .matchCount () ) { 

RelatedUrl swap - _rurls [i] ; 

_rurls li] - _rurls Cj 1 ; 

— rurlslj] o swap/ 



} 
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/*$Id; RelatedUrlGenerate. java, v 1.5 Exp $ */ 

// Author: David Siegel 

// 

package Blinkutil; 

import j a va . io . * ; 

import: java.lang.*; 

import j ava . ut i 1 . * ; 

import j ava .util .Date; 

import j ava . text . * ; 

import java.sql.*; 

import java . sql . SQLSxception; 

public class Re 1 a tedurl Generate { 

class Item { 

private int _urlld; 
private int _count? 

public ltem(int urlld) { 
_urlld = urlld; 
count s 0 ; 

} " 

public int urlldO { return _ urlld; } 
public int count {) { return _count; } 
public void increment () { count ++; ) 

) 

Hashtable _ht; 

public RelatedUrlGenerate ( ) ( 
_ht = null; 

} 

public void add (ResultSet rs) throws SQLException { 
int raatchurlld « rs .getlnt ( »url_id D ) ; 
Item item « ( Item) _ht .get (new Integer (mat chUr lid) ) ; 
if (item »=» null) { 

item = new Item < mat chUr lid) ; 
ht. put (new Integer ( ma tchUrl Id ) , item); 

} " 

item. increment ( ) ; 



[0 0 6 7J 



J 



(45) &m 2002-539559 



ffift I : I^V^A- Java y — K 



APPENDIX I: Sample Java Source Code 



public void update (int urlld) throws SQLException , Fatal Exception { 
_ht - new HaehtableO; 

SQL.RelatedUrlFindlthis, urlld> ; 

Enumeration elems = _ht . elements O ; 
while (elems .haeMoreBleroents () ) ( 

Item item = (item) elems .next Element () ; 

SQL. RelatedUrl Update (urlld, item. urlld () , item. count ()) ; 

) 
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Level 1: 

7 > 0.125 

10 > 0.1 

11 ---> 0.1 

12 > 0.3 

Level 2: 

1 ---> 0.08333333333333333 

2 > 0.125 

3 > 0.125 

5 > 0.06333333333333333 

9 > 0.08333333333333333 

15 > 0.0703125 

19 > 0.0703125 

22 > 0.0625 

23 > O. 0078125 

44 > 0.375 
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/* Sid: Embed. java,v 1.7 Exp $ */ 

// Author: David Siegel 

// 

Import com. blink. blink. Conf ig; 
import j ava . io . * ; 
import j ava . lang . * ; 
import java.util.*; 

import j ava .net . Mai f ormedURLBxc ep t ion ; 
import j ava . sql - SQLExcept ion ; 
import javax.servlet.*; 
import javax.servlet.http.*; 

import BlinkUtil.*; 

public class Embed extends HttpServlet { 

private static Session _s ess ion; 
private State _state; 
private int count a 0; 

public void init (Serv let Conf ig servletConf ig) throws ServletBxception { 
super. init (servlet Conf ig) ; 
try { 

Conf ig . load ( ) ; 
} catch (IOBxception e) { 

throw new ServletBxception ( "Can' t load configuration data:" + 
e . getMessage ( ) ) ; 

} 

Log. init 0 ,- 

_state State. gets tate ( ) ; 

^session = new Session {null , null, null, null); 
Config config - Conf ig.getConf ig {) ? 

_ session. dispatch tconf ig.get ( "html .url . server . root") + 
conf ig . get ( n html . url . run " ) ) ; 

} 

private String fmt (String html) { 
html = Page* quo teQuote (html) ; 

return "document .write (\ n » + html + "N");^*; 

} 

public void service (HttpServletRequest req, HttpServletResponse reB) 
throws IOBxception, ServletBxception { 
ServletOutputStream out » res .get Outputs t ream () ; 
res . setContentType ( "text /html " ) ; 

String cmd = req. get Parameter ("cmd") ; 

if (cmd. equals ("gen") ) { 

String dirldStr » req. get Parameter ("dir n > ; 
String options - req . get Parameter ( n opt " ) ; 
try { 

EmbedXinks e « new CmbedLinks ( session) ; 
String str « e .html (dirldStr, options); 
if (Log. Debug) Log. log (Log. Dispatch, fmt (str)); 
out. print In (fmt (str) ) ; 
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} catch (Exception e) { 

out. print In (f rat {"Folder not available")); 

if (Log.Syslog) Log . log (Log . Bmbed, "Embed Folder (" + dirldStr + 
", " + options + ") gotr" ♦ e . getMesaage ( ) ) ; 

} 

} else if (cmd. equals ("hit") ) { 

String urlldStr = req.getPararoeterCurl") ; 
String dirldStr = req.getParameter ("dir") ; 
try { 

int urlld = Page. getld (urlldStr, »url»); 

int dirld = Page. getld (dirldStr. "dir"); 

Url url = _session.getUrl (urlld, dirld); 

url.hit(dirXd) ,- 

res . sendRedirect (url .href ( I ) ; 

} catch (Exception e) { 

out .print In (fmt ("Cannot launch URL")); 

if (Log.Syslog) Log. log (Log. Bmbed, "Bmbed hic(" + urlldStr + "," + 
dirldStr + ") got:" + e. getMesaage () ) ; 

} 

} 
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